# Replace the value in CSV column 36 of movies_refine with a class label and
# write the relabelled rows to movies_refine_tagged:
#   below  10,000,000 -> "0"
#   below  50,000,000 -> "1"
#   below 100,000,000 -> "1"
#   below 200,000,000 -> "4"
#   anything else     -> "4"
# NOTE(review): labels "2" and "3" are never emitted, so the five ranges
# collapse into three classes -- presumably an intentional merge; confirm.
# The awk rules are tried top to bottom; the first one that matches rewrites
# column 36, prints the row, and skips the remaining rules with "next".
# Assigning to a field makes awk rebuild the row, hence OFS is set to a comma.
awk -F',' -v OFS=',' '
  $36 <  10000000 { $36 = "0"; print; next }
  $36 <  50000000 { $36 = "1"; print; next }
  $36 < 100000000 { $36 = "1"; print; next }
  $36 < 200000000 { $36 = "4"; print; next }
                  { $36 = "4"; print }
' movies_refine > movies_refine_tagged
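# Disabled alternative: labels column 13 of movies_refine_ROI as 0-4 in steps of 0.5. It writes the same movies_refine_tagged output as the command above, so enable only one of the two.
#awk 'BEGIN {FS=","; OFS=","} {if ($13 < 0.5) {tag="0"} else if ($13 < 1.0) {tag="1"} else if ($13 < 1.5) {tag="2"} else if ($13 < 2.0) {tag="3"} else {tag="4"} $13=tag; print }' movies_refine_ROI > movies_refine_tagged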
# Split the tagged rows on CSV column 5 (presumably the release year -- confirm):
#   movies_refine_wo_2014 : every row whose column 5 is not 2014
#   movies_refine_test    : of those, rows with column 5 >= 2010
#   movies_refine_train   : of those, rows with 2000 <= column 5 < 2010
# Rows whose column 5 is below 2000 end up in neither the test nor the train file.
# A bare awk pattern prints each matching row unmodified, so only the input
# separator needs to be set.
awk -F',' '$5 != 2014' movies_refine_tagged > movies_refine_wo_2014
awk -F',' '$5 >= 2010' movies_refine_wo_2014 > movies_refine_test
awk -F',' '$5 >= 2000 && $5 < 2010' movies_refine_wo_2014 > movies_refine_train
